{
    "trainer": {
        "evaluation_strategy": "steps",
        "per_device_train_batch_size": 1,
        "per_device_eval_batch_size": 2,
        "gradient_accumulation_steps": 32,
        "eval_steps": 150,
        "save_steps": 150,
        "logging_steps": 10,
        "learning_rate": 0.0003,
        "num_train_epochs": 3,
        "lr_scheduler_type": "cosine",
        "warmup_steps": 100,
        "fp16": false,
        "bf16": false,
        "torch_compile": false,
        "optim": "adamw_torch"
    },
    "lora": {
        "r": 4,
        "lora_alpha": 32,
        "lora_dropout": 0.02,
        "inference_mode": false,
        "task_type": "SEQ_2_SEQ_LM"
    },
    "load_in_8bit": true,
    "model_name": "bigscience/mt0-xxl-mt",
    "model_type": "seq2seq",
    "template_category": "seq2seq_no_newlines",
    "max_source_tokens_count": 400,
    "max_target_tokens_count": 400
}

